<!DOCTYPE HTML>
<html lang="zh-Hans">
    
    <head>
        
        <meta charset="UTF-8">
        <meta http-equiv="X-UA-Compatible" content="IE=edge" />
        <title>Scrapy | 爬虫</title>
        <meta content="text/html; charset=utf-8" http-equiv="Content-Type">
        <meta name="description" content="">
        <meta name="generator" content="GitBook 2.6.7">
        
        
        <meta name="HandheldFriendly" content="true"/>
        <meta name="viewport" content="width=device-width, initial-scale=1, user-scalable=no">
        <meta name="apple-mobile-web-app-capable" content="yes">
        <meta name="apple-mobile-web-app-status-bar-style" content="black">
        <link rel="apple-touch-icon-precomposed" sizes="152x152" href="../gitbook/images/apple-touch-icon-precomposed-152.png">
        <link rel="shortcut icon" href="../gitbook/images/favicon.ico" type="image/x-icon">
        
    <link rel="stylesheet" href="../gitbook/style.css">
    
        
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-highlight/website.css">
        
    
        
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-search/search.css">
        
    
        
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-fontsettings/website.css">
        
    
    

        
    
    
    <link rel="next" href="../scrapy框架/scrapy_setting.html" />
    
    
    <link rel="prev" href="../进程线程协程/threading.html" />
    

        
    </head>
    <body>
        
        
    <div class="book"
        data-level="8"
        data-chapter-title="Scrapy"
        data-filepath="scrapy框架/scrapy.md"
        data-basepath=".."
        data-revision="Fri Oct 19 2018 08:44:08 GMT+0800 (中国标准时间)"
        data-innerlanguage="">
    

<div class="book-summary">
    <nav role="navigation">
        <ul class="summary">
            
            
            
            

            

            
    
        <li class="chapter " data-level="0" data-path="index.html">
            
                
                    <a href="../index.html">
                
                        <i class="fa fa-check"></i>
                        
                        序言
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1" data-path="认识爬虫/introduceSpider.html">
            
                
                    <a href="../认识爬虫/introduceSpider.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.</b>
                        
                        认识爬虫
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="1.1" data-path="认识爬虫/http.html">
            
                
                    <a href="../认识爬虫/http.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.1.</b>
                        
                        HTTP
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1.2" data-path="认识爬虫/Requests.html">
            
                
                    <a href="../认识爬虫/Requests.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.2.</b>
                        
                        requests
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1.3" data-path="认识爬虫/初步爬虫.html">
            
                
                    <a href="../认识爬虫/初步爬虫.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.3.</b>
                        
                        初步爬虫小项目
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="2" data-path="正则表达式/正则表达式.html">
            
                
                    <a href="../正则表达式/正则表达式.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.</b>
                        
                        正则表达式
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="2.1" data-path="正则表达式/正则表达式练习.html">
            
                
                    <a href="../正则表达式/正则表达式练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.1.</b>
                        
                        正则表达式练习
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.2" data-path="正则表达式/正则表达式之后的第一个项目.html">
            
                
                    <a href="../正则表达式/正则表达式之后的第一个项目.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.2.</b>
                        
                        正则表达式之后的第一个项目
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.3" data-path="正则表达式/正则表达式常用表.html">
            
                
                    <a href="../正则表达式/正则表达式常用表.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.3.</b>
                        
                        正则表达式常用表
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.4" data-path="正则表达式/正则表达式重点1.html">
            
                
                    <a href="../正则表达式/正则表达式重点1.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.4.</b>
                        
                        正则表达式重点
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.5" data-path="正则表达式/正则表达式常问问题.html">
            
                
                    <a href="../正则表达式/正则表达式常问问题.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.5.</b>
                        
                        正则表达式常问问题
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.6" data-path="正则表达式/正则爬虫练习.html">
            
                
                    <a href="../正则表达式/正则爬虫练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.6.</b>
                        
                        正则爬虫项目练习
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="3" data-path="XPATH/xpath-in.html">
            
                
                    <a href="../XPATH/xpath-in.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.</b>
                        
                        XPATH
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="3.1" data-path="XPATH/Xpath.html">
            
                
                    <a href="../XPATH/Xpath.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.1.</b>
                        
                        XPATH认识
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="3.2" data-path="XPATH/Xpath的代码例子.html">
            
                
                    <a href="../XPATH/Xpath的代码例子.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.2.</b>
                        
                        XPATH的代码例子
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="3.3" data-path="XPATH/xpath的爬虫练习.html">
            
                
                    <a href="../XPATH/xpath的爬虫练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.3.</b>
                        
                        XPATH的爬虫练习
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="4" data-path="BeautifulSoup/BeautifulSoup.html">
            
                
                    <a href="../BeautifulSoup/BeautifulSoup.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.</b>
                        
                        BeautifulSoup
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="4.1" data-path="BeautifulSoup/常用的css选择器.html">
            
                
                    <a href="../BeautifulSoup/常用的css选择器.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.1.</b>
                        
                        常用的css选择器
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="4.2" data-path="BeautifulSoup/BeautifulSoup4的各种例子.html">
            
                
                    <a href="../BeautifulSoup/BeautifulSoup4的各种例子.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.2.</b>
                        
                        BeautifulSoup4的各种例子
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="5" data-path="代理/proxy.html">
            
                
                    <a href="../代理/proxy.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>5.</b>
                        
                        ip代理池项目
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="6" data-path="Selenium/Selenium.html">
            
                
                    <a href="../Selenium/Selenium.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>6.</b>
                        
                        Selenium
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7" data-path="进程线程协程/introduce.html">
            
                
                    <a href="../进程线程协程/introduce.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.</b>
                        
                        进程线程协程
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="7.1" data-path="进程线程协程/gevent.html">
            
                
                    <a href="../进程线程协程/gevent.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.1.</b>
                        
                        gevent
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.2" data-path="进程线程协程/green_let.html">
            
                
                    <a href="../进程线程协程/green_let.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.2.</b>
                        
                        green_let
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.3" data-path="进程线程协程/yield.html">
            
                
                    <a href="../进程线程协程/yield.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.3.</b>
                        
                        yield
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.4" data-path="进程线程协程/multiprecessing.html">
            
                
                    <a href="../进程线程协程/multiprecessing.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.4.</b>
                        
                        multiprecessing
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.5" data-path="进程线程协程/threading.html">
            
                
                    <a href="../进程线程协程/threading.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.5.</b>
                        
                        threading
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter active" data-level="8" data-path="scrapy框架/scrapy.html">
            
                
                    <a href="../scrapy框架/scrapy.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.</b>
                        
                        Scrapy
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="8.1" data-path="scrapy框架/scrapy_setting.html">
            
                
                    <a href="../scrapy框架/scrapy_setting.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.1.</b>
                        
                        scrapy_setting
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="8.2" data-path="scrapy框架/模块作用.html">
            
                
                    <a href="../scrapy框架/模块作用.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.2.</b>
                        
                        模块作用
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="8.3" data-path="scrapy框架/19个中间件.html">
            
                
                    <a href="../scrapy框架/19个中间件.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.3.</b>
                        
                        19个中间件
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="9" data-path="scrapy-redis分布式/scrapy-redis.html">
            
                
                    <a href="../scrapy-redis分布式/scrapy-redis.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>9.</b>
                        
                        scrapy-redis分布式
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="9.1" data-path="scrapy-redis分布式/scrapy-redis的改造方法.html">
            
                
                    <a href="../scrapy-redis分布式/scrapy-redis的改造方法.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>9.1.</b>
                        
                        scrapy-redis的改造方法
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="10" data-path="spider_projects/introduce.html">
            
                
                    <a href="../spider_projects/introduce.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.</b>
                        
                        spider_projects
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="10.1" data-path="spider_projects/使用代理在普通爬虫脚本下.html">
            
                
                    <a href="../spider_projects/使用代理在普通爬虫脚本下.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.1.</b>
                        
                        使用代理在普通爬虫脚本下
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.2" data-path="spider_projects/xpath爬取前程无忧的数据.html">
            
                
                    <a href="../spider_projects/xpath爬取前程无忧的数据.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.2.</b>
                        
                        xpath爬取前程无忧的数据
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.3" data-path="spider_projects/存储数据库的脚本.html">
            
                
                    <a href="../spider_projects/存储数据库的脚本.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.3.</b>
                        
                        存储数据库的脚本
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.4" data-path="spider_projects/weibo.html">
            
                
                    <a href="../spider_projects/weibo.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.4.</b>
                        
                        爬取央视新闻微博
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.5" data-path="spider_projects/weibo2.html">
            
                
                    <a href="../spider_projects/weibo2.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.5.</b>
                        
                        爬取明星的微博
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.6" data-path="spider_projects/liepin.html">
            
                
                    <a href="../spider_projects/liepin.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.6.</b>
                        
                        爬取猎聘的职位信息Crawl
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.7" data-path="spider_projects/zhilianRe.html">
            
                
                    <a href="../spider_projects/zhilianRe.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.7.</b>
                        
                        纯正则爬取智联的职位信息
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.8" data-path="spider_projects/setting.html">
            
                
                    <a href="../spider_projects/setting.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.8.</b>
                        
                        scrapy中的setting
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.9" data-path="spider_projects/items.html">
            
                
                    <a href="../spider_projects/items.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.9.</b>
                        
                        scrapy中的items
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.10" data-path="spider_projects/pipeline.html">
            
                
                    <a href="../spider_projects/pipeline.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.10.</b>
                        
                        scrapy中的pipeline
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.11" data-path="spider_projects/middlewares.html">
            
                
                    <a href="../spider_projects/middlewares.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.11.</b>
                        
                        scrapy中的middlewares
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.12" data-path="spider_projects/框架中的代码运行脚本.html">
            
                
                    <a href="../spider_projects/框架中的代码运行脚本.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.12.</b>
                        
                        框架中的代码运行脚本
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="11" data-path="爬虫的面试题/面试题1-10.html">
            
                
                    <a href="../爬虫的面试题/面试题1-10.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>11.</b>
                        
                        爬虫面试题
                    </a>
            
            
        </li>
    


            
            <li class="divider"></li>
            <li>
                <a href="https://www.gitbook.com" target="_blank" rel="noopener" class="gitbook-link">
                    Published with GitBook
                </a>
            </li>
            
        </ul>
    </nav>
</div>

    <div class="book-body">
        <div class="body-inner">
            <div class="book-header" role="navigation">
    <!-- Actions Left -->
    

    <!-- Title -->
    <h1>
        <i class="fa fa-circle-o-notch fa-spin"></i>
        <a href="../" >爬虫</a>
    </h1>
</div>

            <div class="page-wrapper" tabindex="-1" role="main">
                <div class="page-inner">
                
                
                    <section class="normal" id="section-">
                    
                        <h1 id="scrapy">Scrapy</h1>
<h2 id="scrapy-&#x5B89;&#x88C5;&#x7684;&#x6B65;&#x9AA4;">scrapy &#x5B89;&#x88C5;&#x7684;&#x6B65;&#x9AA4;</h2>
<ol>
<li>pip install scrapy&#xFF08;&#x5982;&#x679C;&#x6210;&#x529F;&#x4E86;&#x5C31;&#x4E0D;&#x5FC5;&#x6267;&#x884C;&#x4E0B;&#x9762;&#x7684;&#x547D;&#x4EE4;&#x4E86;&#xFF09;</li>
<li>pip install wheel</li>
<li>&#x5230;&#x7F51;&#x7AD9;&#x627E;Twisted&#x5305;&#xFF1A; <a href="http://www.lfd.uci.edu/~gohlke/pythonlibs/" target="_blank">http://www.lfd.uci.edu/~gohlke/pythonlibs/</a></li>
<li>&#x5B89;&#x88C5;&#x4E0B;&#x8F7D;&#x7684;&#x90A3;&#x4E2A;&#x5305;&#xFF1A;pip install E:\12&#x671F;\&#x8BFE;&#x4E0A;&#x4EE3;&#x7801;\Day6\twsted_pakage\Twisted-18.7.0-cp35-cp35m-win_amd64.whl</li>
<li>&#x6700;&#x540E;&#x518D;&#x53BB;&#x5B89;&#x88C5; pip install scrapy</li>
</ol>
<hr>
<h2 id="&#x521B;&#x5EFA;scrapy&#x7684;&#x722C;&#x866B;&#x7684;&#x547D;&#x4EE4;">&#x521B;&#x5EFA;scrapy&#x7684;&#x722C;&#x866B;&#x7684;&#x547D;&#x4EE4;</h2>
<ol>
<li><p>scrapy startproject Tuesday</p>
</li>
<li><p>cd Tuesday</p>
</li>
<li>&#x4F8B;&#x5B50;&#xFF1A;scrapy genspider jobbole jobbole.com</li>
</ol>
<hr>
<ol>
<li>&#x9700;&#x8981;&#x6709;&#x7684;&#x90A3;&#x4E2A;url&#x548C;&#x5B83;&#x6240;&#x5BF9;&#x5E94;&#x7684;&#x51FD;&#x6570;&#xFF0C; &#x5BF9;&#x5E94;&#x5230;scrapy&#x4E2D;&#x5C31;&#x662F;spiders&#x6587;&#x4EF6;&#x5185;&#x9700;&#x8981;&#x5199;&#x7684;&#x5185;&#x5BB9;</li>
<li>&#x9700;&#x8981;&#x6709;&#x5B58;&#x50A8;&#x6570;&#x636E;&#x7684;&#x51FD;&#x6570;&#xFF0C;&#x4EE3;&#x7801;&#xFF0C;&#x6BD4;&#x5982;&#x9700;&#x8981;&#x5B58;&#x5165;mysql&#xFF0C; &#x8FD9;&#x6837;&#x7684;&#x5BF9;&#x4E8E;&#x9700;&#x8981;&#x5B58;&#x50A8;&#x7684;&#x6570;&#x636E;&#x7684;&#x4EE3;&#x7801;&#x5C31;&#x5E94;&#x8BE5;&#x5199;&#x5728;Item Pipeline</li>
<li>&#x6211;&#x4EEC;&#x751F;&#x6210;&#x7684;url&#x548C;&#x5BF9;&#x5E94;&#x51FD;&#x6570;&#x9700;&#x8981;&#x6709;&#x4E00;&#x4E2A;&#x961F;&#x5217;&#x8FDB;&#x884C;&#x5B58;&#x50A8;&#x5E76;&#x4E14;&#x540E;&#x7EED;&#x53BB;&#x4E0B;&#x8F7D;&#xFF0C;&#x8FD9;&#x4E2A;&#x529F;&#x80FD;&#x5728;scrapy&#x4E2D;&#x5C31;&#x5BF9;&#x5E94;&#x7740;Scheduler</li>
<li>&#x6211;&#x4EEC;&#x9700;&#x8981;&#x6709;&#x4E00;&#x4E2A;&#x529F;&#x80FD;&#x53BB;&#x4E0B;&#x8F7D;url&#x6240;&#x5BF9;&#x5E94;&#x7684;response&#xFF0C;&#x8FD9;&#x4E2A;&#x529F;&#x80FD;&#x5BF9;&#x5E94;&#x5230;scrapy&#x4E2D;&#x5C31;&#x662F;Downloader</li>
</ol>
<p><img src="images/scrapy.png" alt="scrapy"></p>
<p>&#x722C;&#x866B;&#x7684;&#x4E94;&#x4E2A;&#x6B65;&#x9AA4;:</p>
<ol>
<li>&#x9700;&#x6C42;</li>
<li>&#x627E;&#x5230;&#x9700;&#x8981;&#x7684;URL</li>
<li>&#x4E0B;&#x8F7D;url&#x5BF9;&#x5E94;&#x7684;&#x4FE1;&#x606F;(Downloader)</li>
<li>&#x89E3;&#x6790;&#x8FD9;&#x4E9B;&#x4FE1;&#x606F;, &#x83B7;&#x53D6;&#x7279;&#x5B9A;&#x7684;&#x4FE1;&#x606F;(spiders)</li>
<li>&#x5B58;&#x50A8;&#x8FD9;&#x4E9B;&#x4FE1;&#x606F;(ItemPipeline)</li>
</ol>
<p>&#x7279;&#x6B8A;&#x7684;&#x662F;, Scheduler.</p>
<p>&#x56E0;&#x4E3A;&#x662F;&#x5206;&#x5E03;&#x5F0F;, &#x6211;&#x4EEC;&#x4E4B;&#x524D;&#x4E5F;&#x8BB2;&#x8FC7;, &#x4F1A;&#x7528;&#x5230;&#x4E00;&#x4E2A;&#x961F;&#x5217;&#x5B58;&#x50A8;&#x5F85;&#x5904;&#x7406;&#x7684;URL. &#x6240;&#x4EE5;Scheduler&#x5C31;&#x662F;: &#x961F;&#x5217;&#x7684;&#x7BA1;&#x7406;&#x5668;</p>
<p><img src="images/scrapy_data.png" alt="&#x6846;&#x67B6;"></p>
<hr>
<h3 id="&#x67B6;&#x6784;&#x6570;&#x636E;&#x6D41;&#x7A0B;&#xFF1A;">&#x67B6;&#x6784;&#x6570;&#x636E;&#x6D41;&#x7A0B;&#xFF1A;</h3>
<ol>
<li>spiders &#x9700;&#x8981;&#x6709;&#x521D;&#x59CB;&#x7684; start_urls &#x6216;&#x8005;&#x662F; &#x51FD;&#x6570; start_requests, &#x4F1A;&#x5728;&#x5185;&#x90E8;&#x751F;&#x6210;Request&#x7ED9;&#x5230;Engine</li>
</ol>
<ol start="2">
<li>Engine&#x4F1A;&#x5C06;&#x521D;&#x59CB;&#x7684;Request&#x53D1;&#x9001;&#x7ED9;Scheduler&#xFF0C; Engine&#x4E5F;&#x4F1A;&#x4ECE;scheduler&#x4E2D;&#x83B7;&#x53D6;request&#x4EE5;&#x4FBF;&#x4EA4;&#x7ED9;downloader&#x4E0B;&#x8F7D;&#x3002;</li>
</ol>
<ol start="3">
<li>Engine&#x5C31;&#x5F97;&#x5230;&#x4E86;Request</li>
</ol>
<ol start="4">
<li>Engine&#x4F1A;&#x5C06;Request&#x53D1;&#x9001;&#x7ED9;downloader&#x4E0B;&#x8F7D;&#xFF0C;&#x5728;&#x8FD9;&#x4E2A;&#x8FC7;&#x7A0B;&#x4E2D;&#xFF0C;&#x4F1A;&#x7ECF;&#x8FC7;Downloader Middlewares&#xFF08;&#x4F1A;&#x7ECF;&#x8FC7;&#x51FD;&#x6570;&#xFF0C;process_request&#xFF09;</li>
</ol>
<ol start="5">
<li>downloader &#x5C31;&#x4F1A;&#x53BB;&#x4E0B;&#x8F7D;&#x9875;&#x9762;&#xFF0C; &#x4E0B;&#x8F7D;&#x7ED3;&#x675F;&#x540E;&#x4F1A;&#x751F;&#x6210;&#x4E00;&#x4E2A;response&#xFF0C;&#x8FD9;&#x4E2A;response&#x4F1A;&#x8FD4;&#x56DE;&#x7ED9;engine&#xFF0C;&#x7136;&#x540E;&#x8FD9;&#x4E2A;&#x8FC7;&#x7A0B;&#x4E2D;&#x4F1A;&#x7ECF;&#x8FC7; Downloader Middlewares&#x3002;&#xFF08;&#x4F1A;&#x7ECF;&#x8FC7;process_response&#xFF09;&#xFF0C;&#x8FD9;&#x4E2A;&#x8FC7;&#x7A0B;&#x4E2D;&#xFF0C;&#x6709;&#x53EF;&#x80FD;&#x4F1A;&#x51FA;&#x9519;&#xFF0C;&#x4F1A;&#x8D70;&#x7684;&#x51FD;&#x6570;&#x53EB;&#x505A;&#xFF08;process_exception&#xFF09;</li>
</ol>
<ol start="6">
<li><p>Engine &#x4ECE;downloader&#x83B7;&#x53D6;&#x5230;response&#x4E4B;&#x540E;&#xFF0C;&#x5C31;&#x4F1A;&#x5C06;&#x8FD9;&#x4E2A;response&#x8FD4;&#x56DE;&#x7ED9;spiders&#xFF0C;spiders&#x4F1A;&#x7EE7;&#x7EED;&#x5904;&#x7406;&#x5B83;&#x3002;&#x8FD9;&#x4E2A;&#x8FC7;&#x7A0B;&#x4E2D;&#xFF0C; response&#x4F1A;&#x7ECF;&#x8FC7;spider middlewares,(process_spider_input)</p>
</li>
<li><p>spiders &#x5904;&#x7406;&#x8FD9;&#x4E2A;response&#xFF0C;&#x4F1A;&#x6709;&#x4E24;&#x79CD;&#x8FD4;&#x56DE;&#x65B9;&#x5F0F;&#xFF0C;&#x7B2C;&#x4E00;&#x79CD;&#x8FD4;&#x56DE;Request&#xFF0C;&#x7B2C;&#x4E8C;&#x79CD;&#x8FD4;&#x56DE;&#x7684;&#x662F;item&#x3002;&#x8FD9;&#x4E24;&#x6837;&#x8FD4;&#x56DE;&#x90FD;&#x4F1A;&#x7ED9;&#x5230; engine&#xFF0C;&#x8FD9;&#x4E2A;&#x8FC7;&#x7A0B;&#x4E2D;&#x5C31;&#x4F1A;&#x7ECF;&#x8FC7;spider middlewares&#xFF08;&#x8FD9;&#x4E2A;&#x51FD;&#x6570;&#x5C31;&#x53EB;process_spider_output&#xFF09;</p>
</li>
<li><p>engine &#x4F1A;&#x6839;&#x636E;&#x8FD4;&#x56DE;&#x7684;&#x7C7B;&#x578B;&#x505A;&#x64CD;&#x4F5C;&#xFF0C; &#x5982;&#x679C;&#x662F;item&#xFF0C;&#x5C31;&#x5C06;&#x8FD9;&#x4E2A;&#x7C7B;&#x53D1;&#x9001;&#x5230;Item Pipeline &#x4E2D;&#x3002;&#x5982;&#x679C;&#x662F;Request&#xFF0C;&#x7EE7;&#x7EED;&#x53D1;&#x9001;&#x5230;scheduler&#x4E2D;&#x3002;&#x7EE7;&#x7EED;&#x722C;&#x866B;&#x3002;</p>
</li>
<li><p>&#x91CD;&#x590D;&#x7B2C;&#x4E00;&#x6B65;&#x7684;&#x5185;&#x5BB9;&#xFF0C;&#x76F4;&#x5230;&#x6CA1;&#x6709;&#x4EFB;&#x4F55;&#x9700;&#x8981;&#x722C;&#x53D6;&#x7684;&#x6570;&#x636E;&#x3002;</p>
</li>
</ol>

                    
                    </section>
                
                
                </div>
            </div>
        </div>

        
        <a href="../进程线程协程/threading.html" class="navigation navigation-prev " aria-label="Previous page: threading"><i class="fa fa-angle-left"></i></a>
        
        
        <a href="../scrapy框架/scrapy_setting.html" class="navigation navigation-next " aria-label="Next page: scrapy_setting"><i class="fa fa-angle-right"></i></a>
        
    </div>
</div>

        
<script src="../gitbook/app.js"></script>

    
    <script src="../gitbook/plugins/gitbook-plugin-search/lunr.min.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-search/search.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-sharing/buttons.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-fontsettings/buttons.js"></script>
    

<script>
// Load the "gitbook" module, then start it with this page's plugin settings.
require(["gitbook"], function (book) {
    // Per-plugin options, keyed by plugin name.
    var pluginSettings = {
        "highlight": {},
        "search": {"maxIndexSize": 1000000},
        "sharing": {
            "facebook": true,
            "twitter": true,
            "google": false,
            "weibo": false,
            "instapaper": false,
            "vk": false,
            "all": ["facebook", "google", "twitter", "weibo", "instapaper"]
        },
        "fontsettings": {"theme": "white", "family": "sans", "size": 2}
    };

    book.start(pluginSettings);
});
</script>

        
    </body>
    
</html>
